% Joint time-frequency scattering paper (MLSP 2015).
% Title is left unbraced so the bibliography style controls its casing.
@inproceedings{joint,
  author    = {And{\'e}n, Joakim and Lostanlen, Vincent and Mallat, St{\'e}phane},
  title     = {Joint time-frequency scattering for audio classification},
  booktitle = {Proc. IEEE MLSP},
  year      = {2015},
  abstract  = {We introduce the joint time-frequency scattering transform, a time shift invariant descriptor of time-frequency structure for audio classification. It is obtained by applying a two-dimensional wavelet transform in time and log-frequency to a time-frequency wavelet scalogram. We show that this descriptor successfully characterizes complex time-frequency phenomena such as time-varying filters and frequency modulated excitations. State-of-the-art results are achieved for signal reconstruction and phone segment classification on the TIMIT dataset.},
}

% Mallat's group-invariant scattering article (CPAM, 2012).
@article{stephane,
  author    = {Mallat, St{\'e}phane},
  title     = {Group invariant scattering},
  journal   = {Communications on Pure and Applied Mathematics},
  volume    = {65},
  number    = {10},
  pages     = {1331--1398},
  year      = {2012},
  publisher = {Wiley},
}

% Bruna and Mallat, invariant scattering convolution networks (2013).
% Journal name is stored with its proper capitalisation because styles print it verbatim.
@article{joan,
  author    = {Bruna, Joan and Mallat, St{\'e}phane},
  title     = {Invariant scattering convolution networks},
  journal   = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  volume    = {35},
  number    = {8},
  pages     = {1872--1886},
  year      = {2013},
  publisher = {IEEE},
}

% Anden and Mallat, deep scattering spectrum (2014).
@article{dss,
  author    = {And{\'e}n, Joakim and Mallat, St{\'e}phane},
  title     = {Deep scattering spectrum},
  journal   = {IEEE Transactions on Signal Processing},
  year      = {2014},
  volume    = {62},
  number    = {16},
  pages     = {4114--4128},
  publisher = {IEEE},
}

% Scattering transform applied to intrapartum fetal heart rate variability (2014).
@article{embs,
  author    = {Chud{\'a}{\v{c}}ek, V{\'a}clav and And{\'e}n, Joakim and Mallat, St{\'e}phane and Abry, Patrice and Doret, Muriel},
  title     = {Scattering transform for intrapartum fetal heart rate variability fractal analysis: A case-control study},
  journal   = {IEEE Transactions on Biomedical Engineering},
  year      = {2014},
  volume    = {61},
  number    = {4},
  pages     = {1100--1108},
  publisher = {IEEE},
}

% Davis and Mermelstein, comparison of parametric speech representations (1980).
% Journal name is stored with its proper capitalisation because styles print it verbatim.
@article{davis-mermelstein,
  author    = {Davis, Steven and Mermelstein, Paul},
  title     = {Comparison of parametric representations for monosyllabic word recognition in continuously spoken sentences},
  journal   = {IEEE Transactions on Acoustics, Speech, and Signal Processing},
  volume    = {28},
  number    = {4},
  pages     = {357--366},
  year      = {1980},
  publisher = {IEEE},
}

% Vinton and Atlas, scalable and progressive audio codec (ICASSP 2001).
% Venue uses the short "Proc. IEEE ..." form found in this file's other conference entries.
@inproceedings{atlas,
  author       = {Vinton, Mark S. and Atlas, Les E.},
  title        = {Scalable and progressive audio codec},
  booktitle    = {Proc. IEEE ICASSP},
  volume       = {5},
  pages        = {3277--3280},
  year         = {2001},
  organization = {IEEE},
}

% Hermansky, modulation spectrum in automatic speech recognition (ASRU 1997).
@inproceedings{hermansky,
  author    = {Hermansky, H.},
  title     = {The modulation spectrum in the automatic recognition of speech},
  booktitle = {Proc. IEEE ASRU},
  pages     = {140--147},
  year      = {1997},
}


% Ellis, Zeng and McDermott, soundtrack classification with audio texture features (ICASSP 2011).
% `month` holds the standard macro; the conference days are kept in `eventdate`,
% a biblatex field that classic BibTeX styles ignore as an unknown field.
@inproceedings{ellis-mcdermott,
  author    = {Ellis, D. P. W. and Zeng, Xiaohong and McDermott, J. H.},
  title     = {Classifying soundtracks with audio texture features},
  booktitle = {Proc. IEEE ICASSP},
  pages     = {5880--5883},
  year      = {2011},
  month     = may,
  address   = {Prague, Czech Republic},
  eventdate = {2011-05-22/2011-05-27},
}

% Thompson and Atlas, non-uniform modulation transform for audio coding (ICASSP 2003).
% The proceedings volume is carried by `volume`, so `pages` holds a plain numeric range
% instead of a volume-prefixed page label.
@inproceedings{thompson2003non,
  author       = {Thompson, Jeffrey K. and Atlas, Les E.},
  title        = {A non-uniform modulation transform for audio coding with increased time resolution},
  booktitle    = {Proc. IEEE ICASSP},
  volume       = {5},
  pages        = {397--400},
  year         = {2003},
  organization = {IEEE},
}

% Cortes and Vapnik, support-vector networks (1995).
% Journal name is stored with its proper capitalisation because styles print it verbatim.
@article{vapnik,
  author    = {Cortes, Corinna and Vapnik, Vladimir},
  title     = {Support-vector networks},
  journal   = {Machine Learning},
  volume    = {20},
  number    = {3},
  pages     = {273--297},
  year      = {1995},
  publisher = {Springer},
}

% LIBLINEAR library paper (JMLR, 2008).
% "Aug" is a month, not an issue number, so it is stored as the `aug` month macro.
@article{liblinear,
  author  = {Fan, Rong-En and Chang, Kai-Wei and Hsieh, Cho-Jui and Wang, Xiang-Rui and Lin, Chih-Jen},
  title   = {{LIBLINEAR}: A library for large linear classification},
  journal = {Journal of Machine Learning Research},
  volume  = {9},
  month   = aug,
  pages   = {1871--1874},
  year    = {2008},
}

% Kittler et al., on combining classifiers (1998).
% Initials are written with periods and spaces so name parsing and abbreviation work.
@article{kittler,
  author    = {Kittler, Josef and Hatef, Mohamad and Duin, Robert P. W. and Matas, Jiri},
  title     = {On combining classifiers},
  journal   = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  volume    = {20},
  number    = {3},
  pages     = {226--239},
  year      = {1998},
  publisher = {IEEE},
}

% TUT acoustic scene classification / sound event detection database paper (EUSIPCO 2016).
@inproceedings{heittola,
  author    = {Mesaros, Annamaria and Heittola, Toni and Virtanen, Tuomas},
  title     = {{TUT} Database for Acoustic Scene Classification and Sound Event Detection},
  booktitle = {24th European Signal Processing Conference 2016 (EUSIPCO 2016)},
  year      = {2016},
  address   = {Budapest, Hungary},
}

% Fastl and Zwicker, "Psychoacoustics: Facts and Models", cited for chapter 4.
% The chapter pointer lives in `note` so that it still prints for a book entry.
% NOTE(review): publisher inferred from the DOI prefix 10.1007 -- confirm.
@book{Fastl2007,
  author    = {Fastl, Hugo and Zwicker, Eberhard},
  title     = {Psychoacoustics: Facts and Models},
  publisher = {Springer},
  year      = {2007},
  note      = {Chapter 4},
  pages     = {1--463},
  isbn      = {3540231595},
  doi       = {10.1007/978-3-540-68888-4},
  url       = {http://zhenilo.narod.ru/new_main/students/Zwicker_Fastl.pdf},
}

% Wang and Brown, computational auditory scene analysis textbook (2006).
@book{Wang2006,
  author    = {Wang, DeLiang and Brown, Guy J.},
  title     = {Computational Auditory Scene Analysis: Principles, Algorithms, and Applications},
  publisher = {Wiley-IEEE Press},
  year      = {2006},
  isbn      = {0471741094},
}

 % Blauert, "Spatial Hearing" (revised edition).
 % The edition statement is stored in `edition` rather than inside the title.
 @book{Blauert2004,
     author    = {Blauert, Jens},
     title     = {Spatial Hearing: The Psychophysics of Human Sound Localization},
     edition   = {Revised},
     publisher = {The {MIT} Press},
     address   = {Cambridge, MA, USA},
     year      = {2004}
 }
